Download the dataset

data <- readRDS("C:/Users/enami/Downloads/very_low_birthweight.RDS")

Find and delete all NAs in columns

na_counts <- colSums(is.na(data))
data_nona <- data[, na_counts <= 100]

And now in rows

data_clean <- na.omit(data_nona)

Lets do the numeric variables density plots

numeric_v <- data_clean %>% select(where(is.numeric))
par(mfrow = c(3, 3)) 
for (var in names(numeric_v)) {
  plot(density(numeric_v[[var]], na.rm = TRUE),
       main = paste("Плотность для", var),
       xlab = var,
       ylab = "Плотность")
}

IQR=Q3−Q1 Нижняя:

Q1−1.5⋅IQR Верхняя:

Q3+1.5⋅IQR

remove_outlier <- function(data, var) {
  q <- quantile(data[[var]], probs = c(0.25, 0.75), na.rm = TRUE)
  iqr <- q[2] - q[1]
  lower <- q[1] - 1.5 * iqr
  upper <- q[2] + 1.5 * iqr
  data %>% filter(data[[var]] >= lower, data[[var]] <= upper)
}
####the function on top is supposed to remove outliers based on IQR
data_nooutlier <- numeric_v
for (var in names(data_nooutlier)) {
  data_nooutlier <- remove_outlier(data_nooutlier, var)
}

Lets do categorical transformation

categorical_v <- data_clean %>% select(where(is.character))
categorical_v <- categorical_v %>% mutate(across(everything(), as.factor))

Graph for two numeric..?

data_clean <- data_clean %>%
  mutate(dead = as.factor(dead), pneumo = as.factor(pneumo), inout = as.factor(inout))
ggplot(data = data_clean, aes(x = pneumo, fill = inout)) +
  geom_bar(position = "dodge", aes(y = ..count..)) +
  facet_wrap(~ dead, labeller = labeller(dead = c("0" = "Выжившие", "1" = "Умершие"))) +
  theme_minimal() +
  labs(
    title = "Распределение пневмонии по inout и статусу выживания",
    x = "Наличие пневмонии",
    y = "Количество случаев",
    fill = "In/Out"
  )
## Warning: The dot-dot notation (`..count..`) was deprecated in ggplot2 3.4.0.
## ℹ Please use `after_stat(count)` instead.
## This warning is displayed once every 8 hours.
## Call `lifecycle::last_lifecycle_warnings()` to see where this warning was
## generated.

Please, dont kill me but i will check normality probably

data_clean %>%
  group_by(inout) %>%
  summarise(shapiro = list(shapiro_test(lowph))) %>%
  unnest(shapiro)
## # A tibble: 2 × 4
##   inout        variable statistic       p.value
##   <fct>        <chr>        <dbl>         <dbl>
## 1 born at Duke lowph        0.965 0.00000000758
## 2 transported  lowph        0.965 0.0228
test <- wilcox_test(data_clean, lowph ~ inout)
test
## # A tibble: 1 × 7
##   .y.   group1       group2         n1    n2 statistic            p
## * <chr> <chr>        <chr>       <int> <int>     <dbl>        <dbl>
## 1 lowph born at Duke transported   448    83    25630. 0.0000000417
data_clean %>%
  ggplot(aes(x = inout, y = lowph, color = inout)) +
  geom_boxplot() +
  stat_compare_means(method = "wilcox.test", label = "p.signif")

rstatixplot

library(rstatix)
ggboxplot(data_clean, x = "inout", y = "lowph",
          color = "inout", palette = "jco") +
  stat_compare_means(method = "wilcox.test")

Значение lowPH статистически значимо отличаются внутри группы inout. Так как, группа transported имеет значимо более низкие уровни pH, то и выживаемость у них будет ожидаться ниже

datacontinuous <- data_clean %>%
  select(-c(birth, year, exit)) %>%  
  select_if(is.numeric)
cormatrix <- cor(datacontinuous, use = "complete.obs")
print(cormatrix)
##              hospstay       lowph       pltct        bwt        gest
## hospstay  1.000000000 -0.09460363 -0.05993874 -0.2315169 -0.18461328
## lowph    -0.094603635  1.00000000  0.26643681  0.3261464  0.37926758
## pltct    -0.059938743  0.26643681  1.00000000  0.2598576  0.06545086
## bwt      -0.231516924  0.32614640  0.25985757  1.0000000  0.69134598
## gest     -0.184613279  0.37926758  0.06545086  0.6913460  1.00000000
## twn       0.005945527  0.03835193 -0.01407561  0.1614821  0.17101963
## apg1     -0.065378517  0.26799978  0.28021129  0.3309873  0.25568063
## vent      0.252473223 -0.58322801 -0.27313969 -0.3825846 -0.41200521
## pda       0.202599688 -0.22489191 -0.22166244 -0.2591969 -0.29283921
## cld       0.385734403 -0.30046333 -0.18031810 -0.4552955 -0.42163729
##                   twn        apg1        vent         pda         cld
## hospstay  0.005945527 -0.06537852  0.25247322  0.20259969  0.38573440
## lowph     0.038351928  0.26799978 -0.58322801 -0.22489191 -0.30046333
## pltct    -0.014075607  0.28021129 -0.27313969 -0.22166244 -0.18031810
## bwt       0.161482147  0.33098733 -0.38258456 -0.25919691 -0.45529548
## gest      0.171019629  0.25568063 -0.41200521 -0.29283921 -0.42163729
## twn       1.000000000  0.06570395 -0.03854605  0.01447667 -0.08853468
## apg1      0.065703952  1.00000000 -0.33681567 -0.19312965 -0.26967928
## vent     -0.038546054 -0.33681567  1.00000000  0.35471303  0.48398148
## pda       0.014476666 -0.19312965  0.35471303  1.00000000  0.40233337
## cld      -0.088534685 -0.26967928  0.48398148  0.40233337  1.00000000
corrplot(cormatrix, method = "circle", type = "upper", order = "hclust", 
         col = colorRampPalette(c("darkblue", "white", "darkred"))(200), 
         tl.col = "black", tl.srt = 45)

heatmap(cormatrix, 
        col = colorRampPalette(c("blue", "white", "red"))(200),
        scale = "none",  # не масштабировать данные
        margins = c(10, 10))

Иерархическая кластеризация

distmx <- as.dist(1 - cormatrix)
hclust <- hclust(distmx, method = "ward.D2")
plot(hclust, main = "Иерархическая кластеризация", 
     xlab = "Переменные", sub = "", cex = 0.8)

Тепловая карта и дендрограмма

pheatmap(cormatrix,
         color = colorRampPalette(c("darkblue", "ivory", "darkred"))(200),
         cluster_rows = hclust,  
         cluster_cols = hclust,  
         main = "Тепловая карта и дендрограммы")

PCA Анализ

sapply(datacontinuous, range) #разброс значений перемнных отличается значительно требуется шкалирование!
##      hospstay    lowph pltct  bwt gest twn apg1 vent pda cld
## [1,]     -295 6.529999    16  400   23   0    0    0   0   0
## [2,]      797 7.549999   571 1500   36   1    9    1   1   1
pca <- prcomp(datacontinuous, scale. = TRUE)
summary(pca)
## Importance of components:
##                           PC1    PC2    PC3     PC4     PC5     PC6    PC7
## Standard deviation     1.8711 1.0815 1.0553 0.92904 0.88809 0.86784 0.8331
## Proportion of Variance 0.3501 0.1170 0.1114 0.08631 0.07887 0.07532 0.0694
## Cumulative Proportion  0.3501 0.4671 0.5784 0.66475 0.74362 0.81893 0.8883
##                            PC8     PC9    PC10
## Standard deviation     0.70031 0.60398 0.51133
## Proportion of Variance 0.04904 0.03648 0.02615
## Cumulative Proportion  0.93738 0.97385 1.00000
fviz_eig(pca, addlabels = TRUE, ylim = c(0, 100))

Интерпретация - standard deviation показывает разброс данных вокруг каждой из компонент, где это значение наибольшее (в нашем случае PC1) та компонента лучше всего и объясняет различие данных.Proportion of variance тоже показывает сколько наших данных обьясняет компонента, как и кумулятивная пропорция. В нашем случае наиболее важная компонента - первая

Biplot

data_dead <- datacontinuous  
data_dead$dead <- data_clean$dead
pca <- prcomp(datacontinuous, scale. = TRUE)
fviz_pca_biplot(pca, 
                geom.ind = "point",  
                pointshape = 21,     
                pointsize = 3,       
                fill.ind = data_dead$dead,  
                col.var = "black",  
                gradient.cols = c("darkblue", "cyan", "darkred"),  
                repel = TRUE,        
                legend.title = "Dead")

transfer to plotly

interactive biplot

data_clean$id <- seq_len(nrow(data_clean))
dataid <- data_clean %>%
  select(-c(birth, year, exit)) %>%
  select_if(is.numeric)
dataid$id <- data_clean$id  
dataid$dead <- data_clean$dead 
pca <- prcomp(dataid %>% select(-c(id, dead)), scale. = TRUE)
pca_2 <- as.data.frame(pca$x)
pca_2$id <- dataid$id  
pca_2$dead <- dataid$dead
pca_var <- as.data.frame(pca$rotation)
pca_var$varnames <- rownames(pca_var)
fig <- plot_ly() %>%
  # Добавление точек для наблюдений
  add_trace(
    data = pca_2,
    x = ~PC1, y = ~PC2,
    type = "scatter",
    mode = "markers",
    text = ~paste("ID:", id, "Dead:", dead),  
    hoverinfo = "text",
    marker = list(
      size = 10,
      color = ~dead,  
      colorscale = "RdBu",
      showscale = TRUE
    )
  ) %>%
  
  add_trace(
    data = pca_var,
    x = c(rep(0, nrow(pca_var)), pca_var$PC1 * 5),  
    y = c(rep(0, nrow(pca_var)), pca_var$PC2 * 5),
    type = "scatter",
    mode = "lines+text",
    line = list(color = "black"),
    text = c(rep("", nrow(pca_var)), pca_var$varnames),  
    textposition = "top right",
    hoverinfo = "text"
  ) %>%
  layout(
    title = "PCA Biplot (Interactive)",
    xaxis = list(title = "PC1"),
    yaxis = list(title = "PC2"),
    showlegend = FALSE
  )


fig

Мы не выявили причинно-следственной связи между выживаемостью и распределением другим данных, нам все равно нужно проводить дополнительный анализ выживаемости, метод главных компонент поможет нам лишь отобрать те данные, которые с большей вероятностью предскажут dead статус. Dead переменная также принимает только два значения 0 и 1 (нет и да), а для PCA нам нужны непрерывные переменные

UMAP

pca <- prcomp(dataid %>% select(-c(id, dead)), scale. = TRUE)
pca_d <- as.data.frame(pca$x)
pca_d$id <- dataid$id
pca_d$dead <- dataid$dead


umap <- umap(dataid %>% select(-c(id, dead)))


umap_d <- as.data.frame(umap$layout)
umap_d$id <- dataid$id
umap_d$dead <- dataid$dead


pcaplot <- ggplot(pca_d, aes(x = PC1, y = PC2, color = as.factor(dead))) +
  geom_point() +
  labs(title = "PCA ", color = "Dead") +
  theme_minimal()


umapplot <- ggplot(umap_d, aes(x = V1, y = V2, color = as.factor(dead))) +
  geom_point() +
  labs(title = "UMAP ", color = "Dead") +
  theme_minimal()

library(gridExtra)
## 
## Attaching package: 'gridExtra'
## The following object is masked from 'package:dplyr':
## 
##     combine
grid.arrange(pcaplot, umapplot, ncol = 2)

UMAP change distance (я не поняла, нужно ли нам опять делать раскраску по переменной dead, сделала ее в прошлом примере навсякий случай, но дальше не буду)

umap_res_1 <- umap(dataid %>% select(-c(id, dead)), 
                   n_neighbors = 10, min_dist = 0.1)
umap_data_1 <- as.data.frame(umap_res_1$layout)
umap_plot_1 <- ggplot(umap_data_1, aes(x = V1, y = V2)) +
  geom_point(color = "pink") +
  labs(title = "UMAP") +
  theme_minimal()

umap_plot_1  

Результат - дата стала менее структурированной (нет четкого выделения кластеров, как в прошлых примерах). Я считаю, что это связано с тем что я уменьшила дистанцию и соседей и алгоритм теперь основывается на локальных связях между точками и старается их группировать компактно между собой, при этом мы упускаем глобальную структуру данных

Permutation task

data_clean$bwt_50 <- data_clean$bwt
num_rows <- nrow(data_clean)
num_permuted <- round(num_rows * 0.5)
perm_indices <- sample(1:num_rows, num_permuted)
data_clean$bwt_50[perm_indices] <- sample(data_clean$bwt_50[perm_indices])
data_clean$bwt_100 <- sample(data_clean$bwt)
perform_pca <- function(data, column_name) {
  data_numeric <- data %>% select(-c(birth, year, exit, column_name)) %>% select_if(is.numeric)
  pca <- prcomp(data_numeric, scale. = TRUE)
  pca_result <- summary(pca)
  return(pca_result)
}


perform_umap <- function(data, column_name) {
  data_numeric <- data %>% select(-c(birth, year, exit, column_name)) %>% select_if(is.numeric)
  umap_model <- umap(data_numeric)
  return(umap_model$layout)
}
pca_original <- perform_pca(data_clean, 'bwt')
## Warning: Using an external vector in selections was deprecated in tidyselect 1.1.0.
## ℹ Please use `all_of()` or `any_of()` instead.
##   # Was:
##   data %>% select(column_name)
## 
##   # Now:
##   data %>% select(all_of(column_name))
## 
## See <https://tidyselect.r-lib.org/reference/faq-external-vector.html>.
## This warning is displayed once every 8 hours.
## Call `lifecycle::last_lifecycle_warnings()` to see where this warning was
## generated.
pca_original
## Importance of components:
##                           PC1    PC2     PC3    PC4     PC5    PC6     PC7
## Standard deviation     1.7859 1.1299 1.08060 1.0206 0.97193 0.9315 0.91101
## Proportion of Variance 0.2658 0.1064 0.09731 0.0868 0.07872 0.0723 0.06916
## Cumulative Proportion  0.2658 0.3722 0.46948 0.5563 0.63500 0.7073 0.77646
##                            PC8     PC9    PC10    PC11    PC12
## Standard deviation     0.84315 0.81449 0.69931 0.68132 0.59573
## Proportion of Variance 0.05924 0.05528 0.04075 0.03868 0.02957
## Cumulative Proportion  0.83571 0.89099 0.93174 0.97043 1.00000
umap_original <- perform_umap(data_clean, 'bwt')
umap_original
##            [,1]         [,2]
## 2    0.08134178 -1.966536179
## 4    1.93980803 -0.046309478
## 5   -0.78792197  3.947475861
## 7    2.84173343  1.100311245
## 10  -1.09816622  4.087933307
## 11   1.75893969  2.135278796
## 13   1.57316124  2.486712557
## 14  -0.71059838  4.110642262
## 15  -3.60873091 -2.302998087
## 16  -1.19219162  4.038703908
## 17   0.32280846  0.845107422
## 19   1.70882817  2.200318458
## 20   2.65620504  1.486608213
## 21  -3.10636731 -3.018667999
## 22   1.55525149  2.323932122
## 23   0.88482424  0.167100610
## 25   1.57228777  0.302639466
## 27  -1.09352000  3.911413993
## 28  -0.26872983  3.968739879
## 29  -3.17837834 -2.729470424
## 30   0.41320223 -1.526142809
## 31   0.14257462  4.012757768
## 32  -0.68084561  3.971331880
## 35   2.28234739  0.479797051
## 36  -3.78949781 -2.113417138
## 40  -0.71464294  3.984270457
## 41   0.15746315 -2.033397980
## 42   1.08758300  0.230774209
## 43   2.72694568  1.424104685
## 45  -3.41858695 -2.462539209
## 46   0.42461445  1.586874795
## 47  -0.46943981 -2.935400251
## 48   1.94437643 -0.084729197
## 50  -2.92595518 -2.787818795
## 51   1.48296831  0.406200707
## 53   0.47061231  0.374515407
## 54  -0.13828922  4.021913591
## 55   1.63459369  0.323319418
## 56   1.73329296  2.195746910
## 57   0.27673771  3.283292737
## 58   0.32449883 -1.860750735
## 59   0.94668629  0.902173757
## 62  -2.82316179 -2.906885404
## 65   0.06531802  3.761128526
## 66   1.62121114  2.261116786
## 67   0.01352182  3.901739048
## 68   0.79991427  0.371959971
## 69  -2.42020772 -2.957471313
## 70  -3.04719138 -3.067416593
## 72   0.18423962 -2.104755555
## 74   2.87172523  0.867179349
## 75   1.41398297  0.546055413
## 76  -1.18302060  3.974698727
## 77  -3.84034400 -2.093087420
## 78   0.55232887  1.955211828
## 80   1.47378103  2.098831438
## 81   2.68453363  0.915036406
## 82   0.09394661  3.239266313
## 83   2.28591904  0.693755399
## 84  -3.14563055 -2.562646268
## 85   0.21652240 -1.042085676
## 86   1.79427149  0.051520783
## 87   1.46887629  2.074180288
## 88  -3.80455403 -2.187913595
## 91   0.08243764 -2.135658848
## 92   0.16051648 -1.623706740
## 94   2.00887581  0.921777512
## 95  -3.01247806 -2.973014705
## 97  -1.08466037  4.007441442
## 98   0.88892340  0.162568054
## 99   2.65771953  1.433147195
## 101  0.93271430  0.828806078
## 102 -2.49786199 -2.961685832
## 103 -2.83125886 -2.863778054
## 104  2.94389638  1.157423487
## 105  2.19680980  0.059766690
## 107  1.52868523  2.338231628
## 108  0.06012182  3.894425318
## 109  1.33025439  0.945850866
## 111  0.28836703  3.290411211
## 114 -3.76393922 -1.942868238
## 115  0.58694776 -1.819891165
## 116 -0.03166899 -2.176174008
## 117 -0.62417555  4.023413212
## 118  1.70200579  0.578433194
## 119  0.63005660  1.075042399
## 120 -2.57483227 -2.865564572
## 121  0.22800217  0.575304602
## 122  0.50535111 -1.961687193
## 124  1.66298763  0.026527564
## 125 -3.15413865 -2.520265257
## 126  0.24762507  3.536646053
## 127  1.02239188  0.697180842
## 128  1.08599307  2.482018173
## 129  2.01309896  0.482226309
## 130 -2.96123173 -3.106520583
## 131 -1.26158119  3.991629569
## 132  0.08279661  0.467670260
## 133 -3.79472654 -2.158355602
## 134  0.75034081  1.267357908
## 137  2.01317935  0.340036538
## 139 -0.77063869  4.170797265
## 140 -0.11048696  3.999906727
## 141  0.29474333  0.384249768
## 143  0.37290667 -1.886177857
## 144  0.17598967 -2.326686368
## 145 -0.76101578  3.860048653
## 146 -3.10183897 -3.029863955
## 148  0.01181231  3.809615676
## 149 -0.41581837  1.427431468
## 150  0.59985434  2.101960641
## 151  0.47645286 -1.718167529
## 152  1.43773100 -0.141800979
## 153 -0.42585575 -0.332970605
## 154 -0.50343170  4.114776142
## 155  2.18652144  0.300169643
## 156  1.03907643  2.446005103
## 157  0.03447071  0.121985299
## 159  2.61197734  1.105051515
## 160 -0.26152948 -0.268353298
## 161 -0.03924953  1.660450399
## 162 -0.96707176  4.102712260
## 163 -0.39902096  1.283701448
## 164  1.10896048  2.627802307
## 165  1.91244738  1.902428909
## 166 -2.65044913 -2.426899694
## 167 -3.09845365 -2.682515390
## 168  1.96011265  0.314512418
## 169  3.26732263  1.135490520
## 170 -0.57131011 -0.381247347
## 172 -0.96654489  3.450760201
## 173  0.07899598  0.411514377
## 174 -0.16228067  3.825892977
## 176 -3.86878010 -2.031669494
## 177  1.76706067  2.051492759
## 179 -0.05615475 -0.575720151
## 180 -2.96119210 -2.677424145
## 182 -3.17670336 -2.587728404
## 183 -3.87508615 -2.056525275
## 184  0.01077409  0.578187462
## 185 -0.99508493  3.351106270
## 186  1.25780530  0.821003071
## 187 -0.43476370  3.773657577
## 188  2.06317325 -0.171808838
## 189  1.26543518  2.560885405
## 190  0.06288651 -2.542704946
## 191  1.84829939 -0.244464058
## 192 -0.58921890  4.225905860
## 193 -2.75430013  3.210909523
## 194 -3.70196031 -1.411678401
## 195 -3.78600417 -1.313642638
## 196  1.04465831 -0.195007742
## 197 -0.68350110  3.611756360
## 198  0.83433612  1.569518555
## 199 -0.44250362 -0.342339245
## 201  2.96477340  0.772056096
## 202  0.80276249  0.749031435
## 203  2.30325659  0.067705374
## 205  0.13270290 -2.287905011
## 206 -3.56161725 -1.165593438
## 207  3.11396102  0.626081313
## 208  0.96732452  2.436624900
## 210 -0.26555014 -1.558263245
## 211 -0.40917459 -0.278290290
## 212  0.56170798 -1.976070611
## 213 -3.83906505 -1.731139974
## 215 -1.14484624  4.027624434
## 216 -0.77901549  1.695437867
## 217 -3.59071331 -1.084080526
## 218  1.41873855  2.587566946
## 219 -3.25657393 -2.158231066
## 220  3.28550230  1.119883918
## 221 -0.15888866  3.843407794
## 222 -4.01914130 -1.033267608
## 223  0.99118717  2.080085683
## 224  1.44768013 -0.233876187
## 225  2.46096639 -0.164702209
## 226 -0.29834984  4.261205006
## 227 -3.30607824 -2.109988300
## 228  0.02399707 -0.593885929
## 229  0.22801516  2.259182087
## 230 -0.19154870 -0.268012225
## 231  3.09582120  0.728186542
## 232  0.15901489  2.943611486
## 233  2.40963745 -0.522124149
## 234 -1.27072299  3.573647077
## 235  1.20011108  1.653242233
## 236 -0.78682646  3.385136692
## 237  1.13387493  2.555361435
## 238 -3.90134692 -0.773214169
## 239 -0.44239898  4.261278507
## 240 -3.61079038 -1.522546299
## 241 -0.04068378  3.830396982
## 242  0.18007446 -0.185387004
## 243 -2.86701811 -2.131331553
## 244 -0.53214940 -3.022928144
## 245 -2.75627962  3.143698081
## 246  3.05748450 -0.089909086
## 247 -4.02002101 -0.626347048
## 248  0.22530942  2.293752796
## 249 -3.63725525 -1.308197550
## 250  2.93800245 -0.197594274
## 251 -0.79083679  1.816834013
## 253 -0.29452061 -2.918630289
## 255  0.18313139  2.900207619
## 256  0.57831938 -2.461227009
## 257  0.71108120 -2.534601666
## 259  0.40500501  2.660464115
## 260  0.96010353  1.250674785
## 261 -0.41730341 -1.579766857
## 262  3.75947388  0.920294201
## 263  0.19972147 -0.064427028
## 264 -0.14553735 -2.412595769
## 265  2.61433007 -0.649433550
## 267  0.64277040  2.659787974
## 268  0.14561195 -0.761905074
## 269 -0.06203613 -2.447910621
## 270 -3.59865967 -1.541091472
## 271 -3.05172394 -1.908558178
## 272  0.78815131  2.243347859
## 273  0.45234456 -0.359625011
## 274 -0.33628805 -1.451679170
## 275 -2.75988070  3.124992826
## 276  1.42055805 -0.883807938
## 277 -0.43548479  4.318433878
## 278 -0.10346010 -2.068665022
## 279 -3.94166401 -0.499040693
## 280  3.86916729  0.865111537
## 281  1.21428106 -0.709996611
## 282  1.10186573 -0.877664586
## 284  0.70550581  1.550334577
## 285 -2.37884440  2.987602269
## 286  0.20648168 -2.876566569
## 287 -0.64993509  1.831932187
## 288  0.93942215  1.752714658
## 289  3.48336548  0.832972495
## 290  0.11540613  2.246767008
## 292 -2.44685987 -2.187189980
## 295  0.47686422  2.175087734
## 296  3.38154968  0.319089637
## 297  3.64005063  1.197729145
## 298 -2.86759234 -1.997168778
## 299  1.49643612 -1.137607836
## 300 -3.91608698 -1.135481104
## 301  2.71433381 -0.822339700
## 302  3.89813142  0.915477790
## 303 -0.13344524 -3.049044461
## 304  1.31393568 -0.801530112
## 306  3.78767258  1.104746745
## 307 -0.31060894 -3.024311608
## 308 -3.85233137 -0.557253223
## 309 -2.22826687 -2.309659882
## 310  0.47891712 -2.690436230
## 314 -3.11964059 -1.922046133
## 315 -0.37734495 -1.315880675
## 316 -2.55152805 -1.869165547
## 318  0.63508136  2.257643328
## 319 -0.27182241 -3.027509782
## 320  3.92808778  0.978856788
## 321 -0.94276489  1.560604309
## 322 -3.48615077 -1.113219659
## 323  0.21470152  2.179905484
## 325  0.29507155  2.640655822
## 326  0.90262220 -0.916051825
## 328  3.22027880 -0.444186353
## 329  1.20872202 -1.401059965
## 330  0.97806196  1.327346326
## 331 -2.49149505  2.938288869
## 332 -2.45528827 -2.634801677
## 333  0.12945189  2.485561657
## 334 -0.91188659 -2.967088182
## 335 -0.28456267  2.382929893
## 336  0.24773587 -3.015683899
## 337  3.66942322  1.287347670
## 340  0.88112429 -2.570057477
## 341 -0.35996003  2.392887877
## 342  3.41225410  1.567007642
## 343  3.50128896  1.463335601
## 344  3.27137160 -0.522166685
## 345 -0.76557596  1.701009528
## 346  1.04283142 -2.704090963
## 347 -3.73717444  0.118758531
## 348 -3.88165192 -1.047298124
## 350 -3.96750337 -0.863837039
## 352 -4.00403261 -0.273994078
## 353 -2.00289517 -1.117784183
## 354  3.14903612 -0.415757840
## 355  2.79468566 -0.891201012
## 356  3.87409211  1.041982739
## 357 -2.80720497  2.983144443
## 358 -2.46070397  2.845003713
## 360 -3.03066419 -1.844273412
## 361  0.60690926 -1.548135058
## 362  3.47378634 -0.291442984
## 363 -4.07421544 -0.380547721
## 364  0.90886168 -2.612957254
## 365  1.50204232 -2.013980452
## 366  3.45422597 -0.415565333
## 367  3.94823124  0.905946889
## 368 -1.84306361 -2.339428917
## 369 -0.68922120  1.584585731
## 370 -2.65526509  2.870200960
## 371 -1.82908271 -1.672827284
## 372 -3.95727208 -0.833136396
## 373 -2.34073209  2.887545308
## 374  3.30669321 -0.637825691
## 375  1.28343096 -2.208694070
## 376  4.05179713  0.377875551
## 377  1.75165441 -1.399332788
## 378  3.02824928 -0.870824124
## 379 -0.86079485  1.891349234
## 380 -3.77341118  0.097125001
## 381  4.09612628  0.314800588
## 382 -1.71824867 -1.984590550
## 384  0.76543923 -1.357288608
## 385  0.90042872 -1.125699338
## 386 -3.56281913 -0.005223793
## 387 -1.01586455  2.118630942
## 388 -0.53928232 -1.630075960
## 389  3.10695163 -0.816631079
## 390 -2.07074769  2.359095227
## 392 -2.74679956 -1.886903846
## 394  2.72548807 -1.101668657
## 395  2.94845895 -0.877837317
## 396 -1.69621987  2.606734709
## 397 -1.67957919 -2.048100325
## 398 -3.46948748  0.624251419
## 400  4.15348381  0.326449231
## 401 -2.26235819  2.658711973
## 402 -0.59788065 -3.179708382
## 403 -2.54858134  2.722889471
## 404  2.02343492 -1.447472010
## 405 -4.14799832 -0.489077813
## 406 -2.08132140 -2.549565422
## 407 -1.48883753 -2.521483956
## 408 -0.84207117 -1.597132033
## 409  0.99273526 -1.557946089
## 410  1.65066774 -1.496661856
## 414  2.74513569 -1.089715689
## 415 -3.83620191  0.273415159
## 416  0.07994578 -3.252093056
## 417 -3.07445474  2.176276070
## 418 -3.84727725  0.227990301
## 419 -1.27879081  2.392870297
## 420  1.03464012 -1.251242808
## 421 -2.25899958 -1.785254982
## 422 -0.57441407 -1.730590114
## 423  2.10795919 -1.703873418
## 424  4.13012139  0.759774400
## 425 -2.51745717 -1.832917972
## 427 -1.95057302  2.607421293
## 428  4.45266298 -0.280692680
## 429 -1.34512284  2.506501038
## 430 -3.57801351 -0.015250679
## 431  4.45090774 -0.415048975
## 432 -2.34409409  2.680851365
## 433 -2.33488868 -0.707538151
## 434  3.37938395 -0.643833326
## 436 -3.86707861 -0.554506147
## 437  1.65026000 -2.277246615
## 438  4.46322311 -0.403818120
## 439  1.97219832 -1.686029466
## 440 -2.60949796 -1.760126752
## 441  0.15905169 -3.428050017
## 442 -1.74231558  2.573389572
## 443  1.10839845 -1.712019267
## 444 -1.11856784 -2.810516439
## 445  4.30303512  0.207893479
## 446  4.77584792  0.563219257
## 449 -1.81460922  1.906355419
## 450  3.26298789 -0.966843292
## 451 -2.77523341  2.575193077
## 452 -1.23145799  2.372023570
## 453  3.62474363 -0.450577424
## 454 -1.44621401  2.483424156
## 455  4.93880077  0.354882641
## 457  3.57303423 -0.591841624
## 458 -2.39572967  2.312615122
## 459  4.52900801 -0.431795140
## 460 -3.37231790  0.135095806
## 461 -2.23180959  2.168385971
## 462 -1.22524124  2.347764153
## 463 -1.22090701  2.139066895
## 464  3.54872544 -0.418419786
## 465 -1.49788372  2.491431781
## 466 -0.06574729 -3.361808651
## 467 -1.32470166 -2.659824967
## 468  4.40906308 -0.347773245
## 469 -1.25032334  2.564383643
## 470 -2.20784689 -0.888054540
## 471 -0.27193251 -3.431796603
## 472 -0.73944698 -1.878525188
## 474  4.16286464  0.142645239
## 475  3.46430845 -0.806125837
## 476  1.09860318 -1.325430790
## 477  0.91542553 -3.174645658
## 478 -1.72386549 -1.326380608
## 479  4.37519590  0.252939186
## 480  4.26102096  0.447586904
## 484 -1.94423072 -1.041546534
## 485 -1.19872178 -1.580901316
## 486  0.73821488 -3.405818765
## 488  2.14313114 -1.965869035
## 490  3.57795942 -0.637533109
## 491  3.55188625 -0.626762060
## 492  2.08413870 -2.165149424
## 493 -1.80425040 -2.225622091
## 494  1.15233543 -3.118107619
## 495 -3.31044791  0.211042807
## 497 -1.16132805  2.334206926
## 498 -2.47062271 -0.061043230
## 499 -1.47299956  1.899363276
## 500 -1.42700848 -2.398018050
## 501 -2.30302648  1.634601074
## 502 -2.68919151  2.399199666
## 503  3.43570587 -1.115676950
## 504  4.58088536  0.288635176
## 505  4.55053223 -0.438908837
## 507 -2.81448390  2.471310506
## 508 -3.55588691 -0.888557710
## 509  4.60845843 -0.550306572
## 511 -3.03598856  0.431228369
## 512 -1.96672381  1.779271859
## 513  2.31201535 -1.963426400
## 514  4.66931022 -0.570203244
## 515 -2.93969935 -1.675717673
## 516  4.60593441 -0.504951885
## 517  2.35930807 -1.986610224
## 518 -3.61114954  0.024864564
## 519  0.96472475 -3.086793959
## 522 -0.80335690 -2.011685984
## 523 -2.24652891 -0.765776133
## 524 -1.33831802  2.490106197
## 525 -2.79179971  0.045713199
## 526  4.02692424 -0.528110091
## 527  1.99429024 -2.388005694
## 528 -3.39093493  1.887372593
## 529  0.49957990 -3.561123998
## 530  2.29587419 -2.039459475
## 531 -2.41476008 -2.148695567
## 532 -1.45358472  2.671285875
## 533 -3.54804961  0.258782447
## 534  0.02576622 -3.387731077
## 535  1.90588624 -2.498836713
## 536 -1.13042066 -1.853586636
## 537  4.20927048 -0.291853688
## 538 -1.77555476 -2.440347555
## 539  3.96927089 -0.683803976
## 541 -1.36394235 -2.404375174
## 542 -1.29293095 -1.937613980
## 543  4.24586536 -0.660464385
## 545 -1.43572720 -2.457812831
## 546  0.95029364 -3.289551063
## 547  4.70593708 -0.537493368
## 548 -2.07546083  1.732019652
## 550 -3.00372072  1.902586920
## 551 -0.83589815 -2.041655919
## 555 -3.41578379  1.981674985
## 558  4.93541645  0.144845495
## 560 -2.32702784  2.204537372
## 561 -1.26973087 -1.792362196
## 563 -2.51412114  2.121752385
## 564 -3.62779765  0.112239069
## 566 -2.95074497  0.177557300
## 568 -3.06747936 -1.574271963
## 569 -2.13578834  1.988738604
## 571  2.35968792 -2.146219094
## 572  0.40762094 -3.645100781
## 573  2.13502045 -2.299632881
## 574  4.00951475 -0.898929518
## 575  2.18482150 -2.298902787
## 578  2.56513264 -1.943286128
## 579  4.77298879 -0.429573300
## 580  0.22066164 -3.612460939
## 581 -2.15415658  1.596906864
## 583 -2.29648459 -0.681985503
## 584 -2.62321531 -1.803706903
## 585  1.15201940 -3.217085684
## 586  5.02064781  0.330544548
## 587  5.05296402  0.065315758
## 588 -1.90912393 -2.579058609
## 590  0.13046222 -3.610176549
## 591 -2.72391575  2.373421361
## 592  2.46529126 -2.103754823
## 593 -2.42508833  2.266182819
## 594 -2.29058201  1.992346460
## 597 -1.96244379  0.928523158
## 599  0.98977677 -3.276426300
## 600 -3.61093400  0.035284204
## 601  5.11472020  0.244957426
## 602 -3.04766609  2.295061260
## 603 -2.13450850 -0.886130536
## 604  0.16377203 -3.644248958
## 605 -2.21017898  1.290865629
## 606  4.81901080 -0.373999474
## 608  2.74292804 -1.946104459
## 609  3.06827893 -1.796444538
## 610 -2.54996641  1.194117464
## 611 -1.37153883 -1.620737156
## 613 -2.51214025  1.441895091
## 615 -2.20041217  0.982255846
## 616  2.79199068 -1.988067226
## 619 -3.53728141  1.379802050
## 620 -3.50849956  0.236791919
## 622 -0.15175376 -3.602075411
## 623  1.65864009 -2.779756410
## 624 -0.91525405 -2.084320105
## 625  5.16456607  0.196806366
## 626  4.75937375 -0.114509800
## 628 -1.91975514  1.394647932
## 629  4.60005479  0.148073777
## 630 -1.17821953 -1.987595769
## 631  5.06591394  0.174524989
## 632 -2.67649195  0.156343641
## 634 -2.34735859  0.683023948
## 636 -1.55236716 -2.256721872
## 638 -3.34472374  1.933952319
## 641  4.76384363 -0.258736530
## 642  0.98997365 -3.262253346
## 643 -3.13512659  2.287265696
## 647 -3.67013157  0.776133282
## 648  4.16916100 -0.810442276
## 649 -1.30030611 -1.592817346
## 650  2.42829186 -2.079432257
## 652 -3.36543299  1.954875326
## 661  0.45898871 -3.624186933
## 662 -0.18321270 -3.536328869
## 664 -2.06415972  1.054689436
## 666  5.12052879  0.141230610
## 667 -2.95207029  0.003462019
## 671 -1.87076897 -1.144009841
pca_50 <- perform_pca(data_clean, 'bwt_50')
pca_50
## Importance of components:
##                          PC1    PC2     PC3     PC4     PC5     PC6     PC7
## Standard deviation     1.872 1.1180 1.08045 1.03080 0.97266 0.91613 0.87923
## Proportion of Variance 0.292 0.1042 0.09728 0.08855 0.07884 0.06994 0.06442
## Cumulative Proportion  0.292 0.3962 0.49346 0.58200 0.66084 0.73078 0.79520
##                            PC8    PC9    PC10    PC11    PC12
## Standard deviation     0.83167 0.8154 0.69811 0.59576 0.50871
## Proportion of Variance 0.05764 0.0554 0.04061 0.02958 0.02157
## Cumulative Proportion  0.85284 0.9082 0.94886 0.97843 1.00000
umap_50 <- perform_umap(data_clean, 'bwt_50')
umap_50
##             [,1]         [,2]
## 2   -2.805938202 -4.142778707
## 4   -1.659734472  1.843844665
## 5    1.651896028  2.980084361
## 7   -0.865696963  3.598541511
## 10  -1.474080734  2.997435858
## 11  -1.172261043  3.408604910
## 13   0.402465355  3.372756309
## 14  -0.275216531  3.770191186
## 15   2.087477431 -2.024186979
## 16   2.324783927  1.590940910
## 17  -1.697844899  1.796736535
## 19  -1.334591829  3.334948627
## 20  -1.159795953  3.507331337
## 21   1.969863662 -2.293906765
## 22   0.316800868  3.339552276
## 23   2.718916658  1.144829613
## 25  -0.345329321  2.316177128
## 27   2.234690802  1.682644255
## 28   1.838435933  2.733504612
## 29  -2.577656852 -4.422138464
## 30   1.221999817 -1.581800069
## 31   1.742411745  3.215351921
## 32   1.826787028  2.731842378
## 35  -1.588236489  2.464588774
## 36  -2.873986835 -4.142412157
## 40   2.087596848  1.966540846
## 41  -2.834367268 -4.245508804
## 42  -1.109901186  1.858200160
## 43  -1.199322054  3.538077448
## 45   2.386089353 -2.420855177
## 46  -0.069705466  2.528045225
## 47  -2.175416854 -4.469870164
## 48  -1.692575581  1.730015852
## 50   2.669272369 -2.499140629
## 51  -1.585706595  1.949878307
## 53  -0.926664821  1.679694954
## 54   1.857899087  3.076089488
## 55   2.240399349  1.322876638
## 56  -1.490112374  3.496282748
## 57   1.221906735  3.068318638
## 58  -2.910578870 -4.125897565
## 59  -0.576643959  2.389942832
## 62  -2.573042373 -4.396853675
## 65   1.471552305  3.178802854
## 66   1.519447052  3.084232455
## 67   1.945670291  2.614861845
## 68  -1.152230492  1.870442601
## 69  -2.502134460 -4.255889384
## 70   1.924935434 -2.272996532
## 72  -2.953665534 -4.209753494
## 74  -2.841543175  2.572818881
## 75  -1.044015997  2.211991481
## 76  -0.301479360  2.374316564
## 77   2.930576022 -1.726766901
## 78   2.023568178  2.443847940
## 80  -1.445633111  3.150523537
## 81  -1.567114406  3.203977889
## 82   2.111757359  1.575873080
## 83  -0.852748063  2.651762071
## 84   2.929206999 -2.367507817
## 85   0.317453105 -1.847615616
## 86  -1.404280613  1.828975553
## 87   0.001821905  3.032951461
## 88   3.095806919 -1.862155564
## 91   1.832226936 -2.304528466
## 92  -2.519012589 -3.780596541
## 94   1.512120683  2.846206840
## 95  -2.639559490 -4.418329335
## 97  -1.467399069  2.763777447
## 98  -1.715433624  1.782893200
## 99  -0.162496814  3.351465942
## 101  2.189737144  1.461414737
## 102 -2.593618515 -4.335959037
## 103  3.055009714 -2.126097548
## 104 -1.425241686  3.411834852
## 105 -1.647535932  2.009206606
## 107 -0.110607108  3.621017196
## 108 -1.523092139  3.452969616
## 109 -1.657979728  2.580864776
## 111  0.138821254  3.022543052
## 114  2.709224560 -1.519325574
## 115 -2.977076906 -3.734050178
## 116 -2.554252869 -4.096930812
## 117  1.872289194  2.915901618
## 118 -1.271978939  2.431154514
## 119 -0.443275900  2.513022765
## 120 -2.382750843 -4.169651208
## 121  0.925076168 -1.108519113
## 122 -2.941286377 -3.850215018
## 124 -1.537714737  1.861314523
## 125  2.625789364 -2.417337915
## 126  1.414218046  3.153878889
## 127 -1.596711452  2.091771482
## 128 -0.078191569  3.622364303
## 129 -0.624745960  2.418199352
## 130  1.956086905 -2.391810837
## 131  2.555005076  1.563559542
## 132  1.117828369 -1.373971235
## 133  3.047176651 -1.970349401
## 134 -0.377301594  2.599914885
## 137 -0.222275976  2.497123672
## 139 -1.135147944  3.573716649
## 140  1.821514791  3.013928794
## 141  2.534615988  1.187560038
## 143 -2.894074991 -4.254522809
## 144 -2.621313168 -4.411069352
## 145  2.847499452  1.739394806
## 146  2.046410592 -2.466700398
## 148  1.728275935  3.077465640
## 149 -1.839456747  1.758860227
## 150  1.388691693  2.818959999
## 151  2.840003065 -1.105679112
## 152 -1.256403722  1.695297889
## 153  1.384010458 -1.807925300
## 154 -0.567901515  3.333262590
## 155 -1.683981421  2.170271646
## 156 -0.084168051  3.730973655
## 157  0.675593715 -1.516664418
## 159 -0.389857301  3.846073026
## 160  1.532240566 -1.748163022
## 161  0.990631971  2.502488779
## 162  1.734703919  3.128867988
## 163  1.150110382 -1.108867508
## 164  0.556938129  3.232297457
## 165 -0.217972850  3.716048316
## 166  2.449658771 -2.525493740
## 167  2.165680994 -2.456038951
## 168 -1.746648586  2.144653501
## 169 -0.948765232  3.492176149
## 170  1.615072299 -1.885781219
## 172  2.142457590  1.361398665
## 173  0.182978210 -1.491291206
## 174  0.680570130  2.853965284
## 176  2.317281880 -2.667223843
## 177 -0.256395819  3.736990795
## 179  0.410238345 -1.840666383
## 180  2.960000060 -2.438014275
## 182  2.398068500 -2.546087765
## 183  3.133218528 -1.846836360
## 184  0.290486654 -1.535094679
## 185 -0.657275222  2.498527684
## 186 -1.029843277  2.516981855
## 187  0.907892165  2.562621122
## 188  0.711343245 -1.433338274
## 189  3.029491275  2.163763628
## 190 -2.396168454 -4.460254268
## 191  0.930075077 -1.268506104
## 192  2.322644306  2.670308526
## 193 -1.416716121  3.422899357
## 194  2.913813725 -1.340877962
## 195  2.856890796 -1.247516028
## 196  0.084734689 -1.246624798
## 197 -1.906233991  2.586247370
## 198 -2.198082133  2.546914035
## 199  1.524195559 -1.878160084
## 201 -2.382295205  2.672591800
## 202 -1.790963458  2.107243255
## 203  2.396881902  1.209441479
## 205 -2.296043319 -3.737330134
## 206  2.527516130 -0.767944493
## 207 -1.767907741  2.795051171
## 208 -0.133253175  3.721852230
## 210 -1.854878628 -3.218903746
## 211  1.450108577 -1.783589605
## 212 -2.697713368 -3.581703638
## 213  3.232225865 -1.693841307
## 215  0.636050598  2.688415434
## 216  0.475678874 -1.460191440
## 217  2.720915758 -0.792538005
## 218  2.493990799  2.835527935
## 219 -1.976599991 -4.394459888
## 220  0.648127937  2.977374608
## 221  0.365868964  2.944465361
## 222 -2.430943886 -4.595236636
## 223  0.291732881  2.976366335
## 224  2.713341236  1.428883343
## 225 -2.190373366  2.019002823
## 226  2.428765440  2.850114837
## 227  2.695610560 -2.396950660
## 228  0.132081423 -1.673809032
## 229  0.887507167  2.436517937
## 230 -3.030021765 -3.780877937
## 231 -2.842899260  2.344936199
## 232 -2.336894584  2.620353841
## 233 -2.123075114  1.672787455
## 234  2.578494780  1.042553198
## 235 -2.074769368  2.781808391
## 236  1.011590178  2.238622982
## 237  0.374735491  2.999330909
## 238  3.286333604 -0.765852946
## 239  2.569071499  2.854040551
## 240  3.508130677 -1.005946819
## 241  2.071341400  2.888701052
## 242  0.350197682 -1.488826155
## 243 -2.076275110 -3.967707756
## 244  2.821716834 -2.565808464
## 245  3.123207976  1.664446120
## 246 -2.735417881  2.438349905
## 247  3.438944855 -0.717589316
## 248  0.931020174  2.299798194
## 249  2.748924585 -0.907285137
## 250 -2.407342690  2.378591387
## 251  1.895283068  1.023391523
## 253 -1.950513684 -4.381537329
## 255 -2.384156280  2.705647783
## 256 -2.437295401 -3.722931838
## 257 -2.503372582 -4.624623482
## 259 -3.340221594  2.378323491
## 260 -2.366276088  1.984588519
## 261  3.143224861 -1.489722642
## 262 -3.382066339  2.348610174
## 263  0.544187477 -1.416406044
## 264 -2.064744375 -3.785696383
## 265 -2.116098493  1.934225505
## 267 -2.962866886  2.314472179
## 268 -0.333749009 -1.744490206
## 269 -2.142094770 -3.885853140
## 270  3.552246411 -1.139723264
## 271 -1.621765330 -3.280203730
## 272  0.686001375  2.794875578
## 273  0.091490953 -1.356360189
## 274 -0.971697019 -2.385630275
## 275 -2.587424464  2.346426273
## 276  2.657642162 -0.613126065
## 277  2.616594704  2.724949508
## 278 -1.942907743 -3.473671924
## 279  3.302500780 -0.464837511
## 280  0.252843887  2.986590679
## 281 -1.715200374  1.056765838
## 282 -0.262960851 -1.256470477
## 284 -2.457998964  2.260386788
## 285  0.424686798  2.737887950
## 286 -2.052617005 -4.191834968
## 287  1.372690638  1.668724056
## 288 -2.707456849  2.314954908
## 289 -2.592340345  2.603777865
## 290  0.779632965  2.274314097
## 292 -1.783464139 -3.529445590
## 295  0.682708521  2.085255782
## 296  1.400601249  1.966618490
## 297  2.058788467  2.610155857
## 298  3.300218459 -2.517216547
## 299 -0.822610756 -1.659237305
## 300 -1.959672510 -4.541530045
## 301  1.310966469  1.843814496
## 302 -3.386728404  2.305360668
## 303 -1.899787093 -4.466789666
## 304  2.185039575  0.746206381
## 306 -3.455346278  2.335899926
## 307 -1.740803973 -4.319154772
## 308  3.377602902 -0.756883013
## 309 -1.714922950 -3.506265859
## 310  1.759284335 -1.852097739
## 314  3.505031057 -2.291957567
## 315 -0.964378994 -2.414777330
## 316 -2.144864253 -3.932564554
## 318 -3.264336953  2.276034889
## 319 -1.784810873 -4.356710995
## 320 -3.466461812  2.315599257
## 321  0.251763210 -1.420100680
## 322  2.653925233 -0.603413214
## 323  1.162090174  1.931187768
## 325 -3.518933987  2.267861980
## 326 -0.202896374 -1.296930255
## 328  1.948376233  0.922809003
## 329 -1.035623797 -1.728565298
## 330 -0.509039451 -0.705988449
## 331  2.698036769  2.438873180
## 332  3.064071733 -2.545345674
## 333  0.600336447  1.957717224
## 334  2.982087019 -2.619285047
## 335  1.114183923  1.953139117
## 336 -1.977132058 -4.535714625
## 337 -3.286739967  1.981685032
## 340 -0.910948775 -2.365349934
## 341 -1.956632803  2.539087788
## 342  2.879767339  2.599088623
## 343  3.059688906  2.281913740
## 344 -2.549151829  2.139364094
## 345 -2.936609552 -0.388734712
## 346 -2.777244094 -0.883545002
## 347 -0.619149776 -1.478657311
## 348 -1.757947292 -3.404772655
## 350  3.671770486 -0.897311622
## 352  3.664476634 -1.073182855
## 353  1.270101751 -1.610763330
## 354  3.217020502  0.366889386
## 355 -0.463081036 -1.116486688
## 356  1.933411211  2.329122918
## 357  0.613126706  1.902249995
## 358  1.302965011  1.891350311
## 360  3.530053731 -2.271877575
## 361 -0.924515372 -2.126403596
## 362 -2.935132731  1.818688949
## 363  3.622112910 -1.081404661
## 364  2.595574203 -0.483864766
## 365 -2.440454287 -0.981226602
## 366 -3.119768516  0.514895197
## 367 -3.578323184  2.056226626
## 368 -1.309553316 -3.441442477
## 369  3.018441513  0.195145019
## 370  3.287245273  1.862854049
## 371 -1.092973528 -2.491980086
## 372  3.689040844 -1.195941678
## 373  2.850418395  2.461329165
## 374  3.029819765  0.572570689
## 375 -0.231838841 -1.514934369
## 376  0.566623777  1.760547656
## 377  2.564650051 -0.245965246
## 378 -2.778506161 -0.768933886
## 379  1.556217569  0.874371512
## 380 -0.949878801 -2.041007913
## 381  2.678980373  2.399816990
## 382 -1.141054517 -2.848267717
## 384 -0.804529963 -1.941868063
## 385 -0.471834857 -1.248122354
## 386  3.472913286 -0.066192399
## 387  1.346109484  1.006045230
## 388 -1.205961223 -2.556082442
## 389 -3.020333830 -0.006379024
## 390  2.759365149  2.368590028
## 392  3.362496705 -2.524641325
## 394 -2.863762916 -0.349315099
## 395 -2.947138633 -0.283836579
## 396 -3.654249724  1.763249537
## 397  3.735705272 -1.117039434
## 398 -2.867989963 -0.204074251
## 400 -3.468395334  1.821560814
## 401  2.600974541  2.333768135
## 402 -1.493926303 -4.203024126
## 403  2.984674596  2.390897222
## 404  3.418962519  0.239816024
## 405  3.764579381 -1.249516715
## 406  3.925887210 -2.065013067
## 407  3.660118940 -2.329930529
## 408  2.438012430 -0.440205225
## 409 -0.934453169 -1.915701760
## 410  2.562789197 -0.334362009
## 414 -2.890243991 -0.409852057
## 415  3.654589200  0.688585343
## 416 -1.704439460 -4.195602632
## 417 -2.291005020  0.458808195
## 418  3.578700413 -0.013315386
## 419 -0.423522737  0.682356274
## 420  2.208026438  0.307327841
## 421 -1.729019015 -3.534408048
## 422 -1.171915858 -2.526023415
## 423 -0.793218896 -0.904526431
## 424 -3.716930355  1.920600018
## 425  3.474612214 -2.445053444
## 427  2.369909483  2.334687193
## 428 -3.422386553  1.242053801
## 429 -3.636938678  1.733064435
## 430 -1.565711894 -1.938226653
## 431  2.394525831  2.030820741
## 432  2.832507126  2.493767229
## 433  2.544254668 -0.361207507
## 434 -2.942760947 -0.312669500
## 436  3.562067606 -0.841240839
## 437 -2.777309901 -0.786365012
## 438  2.523440506  2.179272283
## 439 -0.460263328 -0.903506392
## 440  3.561892335 -2.401974528
## 441 -1.215275353 -3.309439931
## 442  2.037437126  2.215974662
## 443 -0.587727006 -1.276305112
## 444 -1.160693815 -3.401632037
## 445 -0.471960797  1.083173899
## 446 -3.345419255  1.606772334
## 449  0.521096661  0.455489667
## 450 -2.886297094 -0.114664224
## 451  2.464001157  2.123576589
## 452 -0.017427356  0.869663403
## 453 -3.252699403  1.040545758
## 454  3.733946286  1.238655095
## 455 -4.044614400  1.693989343
## 457 -0.362536422  0.299692258
## 458 -3.531230968  1.183982279
## 459 -2.170943159  0.529594004
## 460  3.374732063 -0.054855874
## 461  0.275664896  0.446831523
## 462  0.171219914  0.986885339
## 463 -3.244444208  0.768341321
## 464 -3.208989961  0.823557244
## 465 -3.682561815  1.393534881
## 466 -1.467629967 -4.068842475
## 467 -1.503582198 -4.049027278
## 468 -3.124805194  1.021920352
## 469  0.055980710  1.043487199
## 470  2.608804435 -0.210107882
## 471 -1.356586681 -3.974294633
## 472 -1.444968158 -2.384329525
## 474 -3.559047500  1.233155698
## 475 -2.992578758 -0.125487533
## 476 -1.135469575 -1.108756637
## 477 -2.534380196 -1.224746602
## 478 -1.500826912 -2.028659417
## 479  0.815423494  1.174725715
## 480  0.095895243  1.092742473
## 484  2.526164374 -0.274168017
## 485  3.705927033 -0.384013711
## 486 -1.357050012 -2.286415177
## 488  2.331191214  0.008881860
## 490 -0.525750675  0.334654145
## 491 -0.394380427  0.339122554
## 492 -1.484589478 -1.007742495
## 493 -1.259135205 -3.366328032
## 494 -2.707929437 -0.979743864
## 495  3.382231816  0.091969800
## 497 -0.245578680  0.809365055
## 498  2.291991224 -0.060221310
## 499  0.141209377  0.462273715
## 500  3.755063737 -2.221207166
## 501  0.382514432  0.279591372
## 502 -0.084348751  1.001019140
## 503  3.530085104  0.393808079
## 504 -4.207915418  1.540461754
## 505 -2.253010527  0.500008454
## 507  3.315755289  2.059095522
## 508  3.932286144 -1.831736265
## 509  0.686304174  0.505306907
## 511 -0.755387436 -0.766792630
## 512  0.376696507  0.256131656
## 513  1.716134912  0.130771154
## 514 -1.855169428  0.406690218
## 515  3.890385546 -2.133242350
## 516 -3.531011983  1.054004408
## 517 -3.013925345 -0.227311921
## 518  3.490244637  0.027269727
## 519 -1.273724538 -1.873490512
## 522 -1.579701861 -2.002179511
## 523  2.286982615 -0.245120555
## 524  0.685581367  1.031506730
## 525  2.544283290 -0.223461705
## 526 -3.528339777  1.022167826
## 527 -1.638278408 -0.934576835
## 528  3.616410656  0.648976831
## 529 -1.882131089 -2.917179776
## 530 -0.988478226 -0.178879866
## 531  3.810754716 -2.285057857
## 532  0.116232747  1.076992852
## 533  3.484724876  0.177720905
## 534 -1.413597920 -3.523305322
## 535 -1.707225978 -1.111033717
## 536 -1.315901358 -1.970376385
## 537 -3.622240284  1.182096495
## 538 -0.918394980 -3.474191622
## 539 -0.020700236  0.271371238
## 541  3.923541004 -1.952870788
## 542 -1.485144341 -2.532474455
## 543  3.778293531  1.179286349
## 545 -0.878452535 -3.285149536
## 546 -1.978645545 -2.071590394
## 547 -1.821246170  0.344482202
## 548  3.614114391  0.958650295
## 550 -1.908593677  0.243459231
## 551 -1.741405034 -2.000065723
## 555  3.634610898  0.691347309
## 558 -4.218366859  1.575844201
## 560  0.903312934  0.945743765
## 561 -1.515973796 -2.418101954
## 563 -3.680875765  1.198658132
## 564  3.523782881 -0.078043745
## 566  2.124707484 -0.123975978
## 568  3.894554302 -2.087549584
## 569  0.711839093  0.491796187
## 571 -1.544853966 -0.804411188
## 572 -1.980928685 -2.370716634
## 573 -1.286346628 -0.551615527
## 574  3.794848587  1.052843223
## 575 -1.379418967 -0.674845497
## 578 -1.374713991 -0.171037469
## 579 -1.410602639  0.234432495
## 580 -0.863635964 -3.042830792
## 581  0.838839092  0.216694356
## 583  2.148982512 -0.331996750
## 584 -0.984684610 -3.494494877
## 585 -2.421121890 -1.296209987
## 586 -4.155416004  1.514029059
## 587 -3.851824510  1.320269420
## 588 -0.971082856 -3.531148925
## 590 -1.338903159 -3.941312306
## 591 -3.840897356  1.339454956
## 592 -1.404921033 -0.354049031
## 593 -0.185967525  0.932972932
## 594  3.785425535  1.158577729
## 597 -0.997156785 -0.355397369
## 599 -2.161236294 -1.655566701
## 600  3.743714397 -0.737965758
## 601  3.617450072  1.480372846
## 602 -3.787531524  1.358865811
## 603 -2.032468333 -2.040552432
## 604 -1.364068491 -3.976463752
## 605  1.067236731  0.119960265
## 606 -1.954972299  0.347197865
## 608  0.082625802 -0.052679329
## 609 -1.138782051 -0.442852376
## 610  0.042189668 -0.018195522
## 611 -1.453414244 -2.538131046
## 613  1.209398399  0.079788493
## 615  1.223365877 -0.027132653
## 616 -1.630603790 -0.773124760
## 619  3.818839069  1.074839649
## 620  3.565894234  0.044563351
## 622 -1.244353807 -3.909903209
## 623 -1.857246127 -1.458312820
## 624 -1.897906920 -2.197360557
## 625 -4.297914749  1.471645260
## 626  0.828812902  0.784727774
## 628 -1.483648147 -0.006400111
## 629 -4.308595342  1.485468815
## 630 -1.677789078 -2.410925904
## 631 -4.292162521  1.481493771
## 632 -1.573767427 -1.584581826
## 634 -1.034269921 -0.515924168
## 636 -0.906312462 -3.462935749
## 638  3.722137975  0.860634742
## 641  0.692164409  0.495783902
## 642 -2.182223440 -1.887052888
## 643  3.634396236  1.242163453
## 647  3.577877550  0.535062918
## 648  0.596802660  0.201013541
## 649 -1.937503310 -1.501323376
## 650 -1.230284202 -0.533738996
## 652  3.730493291  0.842394866
## 661 -1.704134466 -2.535220735
## 662 -1.192556453 -3.786599422
## 664  1.710865587  0.039829904
## 666 -4.295470050  1.466734625
## 667  3.374602342 -0.594264695
## 671 -1.296840102 -2.488335138
pca_100 <- perform_pca(data_clean, 'bwt_100')
pca_100
## Importance of components:
##                           PC1    PC2     PC3     PC4     PC5     PC6     PC7
## Standard deviation     1.9254 1.1503 1.07384 1.02810 0.95159 0.92141 0.84454
## Proportion of Variance 0.3089 0.1103 0.09609 0.08808 0.07546 0.07075 0.05944
## Cumulative Proportion  0.3089 0.4192 0.51530 0.60339 0.67884 0.74959 0.80903
##                            PC8     PC9    PC10    PC11    PC12
## Standard deviation     0.81575 0.73003 0.69914 0.59720 0.49779
## Proportion of Variance 0.05545 0.04441 0.04073 0.02972 0.02065
## Cumulative Proportion  0.86449 0.90890 0.94963 0.97935 1.00000
umap_100 <- perform_umap(data_clean, 'bwt_100')
umap_100
##             [,1]         [,2]
## 2   -0.214306448 -3.947785635
## 4   -0.705589452 -4.441633588
## 5    2.065682762  3.665941153
## 7   -0.021561143 -3.656894425
## 10   0.475438934  1.000447931
## 11   0.860888101 -2.341927967
## 13   2.191097786 -0.998849987
## 14   0.800645085  1.288005869
## 15   2.148079283  2.464043331
## 16   2.388010149  4.037636992
## 17   0.360129017  0.123260007
## 19   0.592838348 -2.323767641
## 20  -0.083525761 -3.669438398
## 21   2.034261590  2.641907666
## 22   2.254217934 -1.014397878
## 23   3.965507992 -0.263656663
## 25   1.071496974 -3.055047031
## 27   2.437017582  3.871807913
## 28   2.306989765  3.980654619
## 29   1.049063783 -1.610519849
## 30   1.031054648 -3.130462581
## 31   2.116806497  2.596123450
## 32   2.274015447  4.019923087
## 35  -0.582856370 -4.193875425
## 36   0.538307397  0.872321928
## 40   2.477104410  3.866829595
## 41  -0.636625543 -4.281986894
## 42   0.780062270 -2.930520322
## 43  -0.160630950 -3.757898327
## 45   2.063650452  2.462526870
## 46   2.383588416 -0.775852878
## 47  -0.811333702 -4.470322275
## 48  -0.824132057 -4.473601044
## 50   2.222707652 -0.953474177
## 51   0.032850405 -3.102781153
## 53   1.240398192 -2.073294040
## 54   2.082354946  2.882833699
## 55   3.893814086 -0.618568384
## 56   0.575673704 -2.250553234
## 57   2.078373460  2.395926401
## 58  -0.178980507 -3.817869531
## 59   1.741721099 -1.752870193
## 62   0.896596237 -1.991448422
## 65   2.026821970  2.480630425
## 66   2.727159075 -0.731749520
## 67   2.433603374  3.781573795
## 68   0.896515036 -2.339736776
## 69   0.932694135 -2.641134668
## 70   2.328699755 -0.788689255
## 72  -0.653637313 -4.276119200
## 74  -1.254082147 -3.731624036
## 75   0.872144735 -2.603486928
## 76   0.895981949  1.569625441
## 77   2.246869273  3.866366088
## 78   3.793191982 -0.087809291
## 80   0.811920798 -2.209387406
## 81  -0.644857587 -4.387363115
## 82   2.130480208  2.505598244
## 83   0.480289398 -3.259280397
## 84   2.289336313  3.578949442
## 85   0.885933662 -2.645213337
## 86  -0.258930995 -3.881546405
## 87   1.749771654 -1.679183056
## 88   2.156109069  4.071752665
## 91   0.938470285 -3.157549693
## 92   0.868277029 -2.615310668
## 94   4.268842686 -0.791577341
## 95   1.033846795 -1.902528276
## 97   0.577624401  1.036507429
## 98   0.414822187 -2.324097339
## 99   0.849801699 -3.055857981
## 101  3.593619107 -0.442591731
## 102  0.886666276 -2.612839149
## 103  3.807523570 -0.183248752
## 104 -0.745978232 -4.326193992
## 105 -0.615315087 -4.235692809
## 107  1.735744592 -1.707382466
## 108  0.384499638  0.454555075
## 109  0.566462374 -2.310412263
## 111  2.122058268 -0.867024357
## 114  2.358413148  3.732244693
## 115 -0.462879338 -3.497688317
## 116 -0.269409350 -3.159469229
## 117  2.006478106  3.632809303
## 118  0.772287673 -2.739440483
## 119  1.960310659 -1.259868930
## 120  0.952308285 -2.288443248
## 121  2.135820066 -0.865911487
## 122 -0.643416803 -4.188203371
## 124 -0.360922913 -3.801354853
## 125  1.992684564  2.586894829
## 126  1.984389102  2.491866566
## 127  0.645386507 -2.145903440
## 128  1.765512054 -1.414516732
## 129  0.648414089 -3.083700057
## 130  2.283769231 -0.271632026
## 131  2.200777746  4.281645328
## 132  2.150554340 -0.744405522
## 133  2.233909229  3.869667797
## 134  1.983768987 -1.177789816
## 137  1.085854090 -3.180150660
## 139  0.473378674  1.031927623
## 140  1.870795779  3.070388348
## 141  3.851850224 -0.143060236
## 143 -0.827331918 -4.212724954
## 144 -0.886416193 -4.255873643
## 145  1.862567132  4.179337110
## 146  2.292555166 -0.048303248
## 148  1.759283036  2.727074066
## 149  0.285509600  0.296318167
## 150  2.617129050 -0.121020151
## 151  4.420174529 -0.717882478
## 152  0.048650845 -3.470892467
## 153  1.665390236 -1.495598235
## 154  0.823178963  1.215134615
## 155 -0.666341774 -3.931224822
## 156  1.692739799 -1.459961068
## 157  1.847265823 -1.289895038
## 159  0.006512767 -3.123811721
## 160  2.328119560 -0.793869355
## 161  1.818099102  2.427330223
## 162  2.156722255  3.616004972
## 163  1.886436083  2.455796872
## 164  1.874598714 -0.927268236
## 165  0.619873436 -2.837476866
## 166  1.706008326 -1.396267734
## 167  2.110773888 -0.683913176
## 168 -0.580930475 -3.515513350
## 169 -0.367031752 -3.505829439
## 170  1.826532077  2.181935657
## 172  2.256501995  3.735372174
## 173  1.484805483 -0.969487075
## 174  1.229283770  1.578782910
## 176  1.149521082  1.644977212
## 177  1.252644415 -2.101793058
## 179  2.220309126 -0.030600897
## 180  1.715424712  2.804093423
## 182  2.243394150 -0.030152223
## 183  1.928419142  4.304222884
## 184  1.938224836 -0.287211659
## 185  0.952004923  1.267040156
## 186 -0.262756461 -1.953398451
## 187  1.190475301  1.566503536
## 188  1.036502313 -3.228982970
## 189  3.991121024 -0.129181586
## 190 -1.252542655 -4.150265676
## 191  1.112764293 -3.221508413
## 192  2.155476227  4.260164670
## 193  0.002651700  1.392077863
## 194  1.845537818  3.795498256
## 195  2.104171274  3.745286086
## 196 -0.403410673 -1.822335836
## 197  0.348296145  0.701114017
## 198  0.328196880 -1.070689533
## 199  1.651273059 -0.882613390
## 201 -1.063489976 -3.477558822
## 202 -0.044601339 -0.513006540
## 203  4.709022297 -0.781997970
## 205 -0.776473126 -3.321721996
## 206  1.574149247  3.394190022
## 207 -0.179007875 -3.583262287
## 208  1.580603543 -1.393952346
## 210 -0.398471164 -1.827195393
## 211  1.812630470 -0.760803970
## 212 -0.711295809 -3.071853996
## 213  1.868037533  4.153576602
## 215  0.875029165  1.593847139
## 216  1.037378465  1.362739870
## 217  1.602852122  3.937400912
## 218  3.884879715 -0.218854214
## 219  0.246165782  0.655053965
## 220  0.956454688 -3.268511440
## 221  2.062025804  0.319613349
## 222 -0.039735829  1.229840368
## 223 -0.272715346 -1.405790035
## 224  4.673029854 -0.401037986
## 225 -1.366276634 -3.606942203
## 226  1.636625716  3.653826809
## 227  1.271284017  2.855354682
## 228 -0.273641089 -1.390118259
## 229  2.195282578 -0.020771290
## 230 -0.198979478 -0.119364858
## 231 -2.234507747 -4.121408079
## 232 -0.003056894  0.183418145
## 233 -2.261557119 -4.140513119
## 234  1.963512248  4.285448436
## 235 -0.641793859 -1.746294440
## 236  1.182485643  1.672893979
## 237  2.166752505 -0.065788125
## 238  1.951426165  4.600594752
## 239  1.525252303  3.931906790
## 240  1.700768733  4.091794858
## 241  1.060996677  2.759914749
## 242  0.323240140 -1.156582936
## 243 -0.010942247  0.082423352
## 244  4.500678348 -0.815642796
## 245  2.098834368  5.912447354
## 246 -1.418857255 -3.579386133
## 247  1.891185704  5.038633461
## 248  2.255957831 -0.060875769
## 249  1.444554629  3.791232952
## 250 -1.324906144 -3.384992687
## 251  0.816030493  2.745139249
## 253 -1.574136910 -3.405777450
## 255  0.087089399  0.244729188
## 256 -1.558397247 -3.565811875
## 257 -2.449902593 -4.023999781
## 259 -0.255850864  0.032020267
## 260 -0.249394838 -0.209050062
## 261  4.611087109 -0.642803489
## 262 -2.289925454 -4.093304507
## 263  0.689343535 -1.090696612
## 264 -0.909156032 -2.781197983
## 265 -2.158103905 -4.028679455
## 267 -0.079896836  0.117759094
## 268 -0.580100703 -1.468130573
## 269 -1.425683791 -3.231711867
## 270  1.470497995  4.071567397
## 271  1.040116343  1.104929838
## 272  0.886200441 -1.071244953
## 273 -0.205449215 -1.258048800
## 274 -1.120274275 -2.306168566
## 275 -0.079545861  1.329500070
## 276  4.584353483 -0.707691882
## 277  1.400153551  4.045123382
## 278 -0.835297422 -1.756264307
## 279  1.863419278  4.958973999
## 280 -2.358847759 -1.597963067
## 281 -1.130103781 -2.231070171
## 282 -0.779059210 -1.699792249
## 284 -0.196503983 -0.255289316
## 285  0.346458673  1.600734856
## 286 -2.788388565 -4.087548325
## 287  0.522335735  3.065031735
## 288 -0.326849417 -0.193087027
## 289 -1.424355955 -2.883495402
## 290  2.112344986 -0.059283550
## 292 -0.394752486 -0.837444017
## 295  0.440905012 -1.035526436
## 296  4.651615409 -0.854527488
## 297  4.636858717 -1.042746740
## 298  0.368009839  2.968640269
## 299 -1.360401480 -2.590627934
## 300 -0.274062252  1.287284630
## 301  4.516914891 -1.057465337
## 302 -2.091194002 -3.629495570
## 303 -2.700977579 -4.008940882
## 304  5.023556746 -0.702219634
## 306 -2.097991671 -3.520791586
## 307 -2.127585016 -3.681293531
## 308  1.739078744  5.013975422
## 309 -0.113564645 -1.211814166
## 310  4.365032645 -1.168279659
## 314  1.133169857  4.059055068
## 315 -0.642115915 -1.305946249
## 316 -0.133723720  0.141594552
## 318 -0.283140406 -0.082983115
## 319 -1.874422507 -3.351095170
## 320 -2.834842470 -4.067759342
## 321  0.275461065  2.756711925
## 322  0.828782182  3.925446345
## 323  2.752472490 -0.047929992
## 325 -0.331717426 -0.023314948
## 326 -0.833879873 -1.327183674
## 328  5.093891643 -0.893546875
## 329 -1.197057320 -2.226203382
## 330 -0.798523832 -1.353585861
## 331  1.412340849  4.847810360
## 332  0.279850233  3.198641940
## 333  0.443081297 -0.942378501
## 334  4.791827186 -0.862597218
## 335  0.154094050  3.085312801
## 336 -2.759520159 -4.034773284
## 337 -1.242947083 -2.033142499
## 340 -2.397087606 -1.706149836
## 341 -0.712748385 -0.009309389
## 342  4.929237360 -0.387262536
## 343  5.167767151 -0.214589568
## 344 -1.604565780 -3.230197227
## 345 -0.431930763  0.328809306
## 346 -2.848773818 -4.000468447
## 347 -0.093624271  1.422229208
## 348 -0.195638714  1.439270224
## 350  1.814248090  5.291991337
## 352  2.080908251  5.985257969
## 353  0.169975663  2.943242216
## 354  5.148530581 -0.311251252
## 355 -2.323456217 -1.597423214
## 356  4.309902118 -1.236854622
## 357  0.215609653  1.604365232
## 358  0.938091029  4.230593699
## 360  0.762539142  3.939069284
## 361 -1.076281093 -1.717974796
## 362 -1.838869627 -3.395126674
## 363  2.058385591  6.006442075
## 364  4.452449000 -1.092479643
## 365 -1.819582754 -3.350834779
## 366 -3.018231562 -3.520231789
## 367 -2.744401590 -3.909282109
## 368 -0.773162713 -0.562656676
## 369  0.668110617  3.835161220
## 370  1.992445251  5.828237063
## 371 -0.771646762 -0.674833385
## 372  1.775283279  5.476414024
## 373  1.168409613  5.401088972
## 374  4.988036752 -0.423892267
## 375 -2.780648259 -1.181057473
## 376 -2.336895015 -1.466441915
## 377  4.955131997 -0.868907808
## 378 -3.257152502 -4.012473730
## 379  0.041788945  2.995334168
## 380 -0.126092373  1.501090079
## 381  4.732519164 -0.769034828
## 382 -0.851462566 -0.792761503
## 384 -1.100873837 -1.326466819
## 385 -1.013095651 -1.015537041
## 386  1.388811503  5.570300916
## 387 -0.039366376  2.900369002
## 388 -3.063899797 -1.954645778
## 389 -2.967676190 -3.961755977
## 390  0.941655229  3.989319997
## 392 -0.204303898  3.261611803
## 394 -2.942598502 -3.728223148
## 395 -3.068181458 -3.931179441
## 396 -0.751227662  0.527713796
## 397  5.288525160 -0.136149269
## 398 -0.399454143  1.310777361
## 400 -3.207070226 -2.580314244
## 401  0.782683298  4.170994096
## 402 -3.200361523 -2.640248343
## 403  1.346980383  5.261096461
## 404  5.133146724 -0.249495529
## 405  2.077986573  6.045884899
## 406  5.315317970  0.120917749
## 407  5.337455814 -0.718378107
## 408  5.225735762 -0.801057151
## 409 -2.869828834 -1.737245174
## 410  4.848275253 -0.899921172
## 414 -3.271071398 -3.665695835
## 415  2.083110475  6.001444052
## 416 -3.309035391 -3.787677531
## 417 -0.316136832  1.432950215
## 418  1.979539649  6.039858186
## 419 -0.967238863  0.126037840
## 420  5.210601972 -0.835855288
## 421 -0.814310058  0.184527091
## 422 -3.210957232 -1.867675921
## 423 -3.068608073 -1.762148888
## 424 -3.235997496 -3.907302142
## 425 -0.351509244  3.327587464
## 427 -0.226540998  3.529939269
## 428 -3.685155057 -2.463655277
## 429 -0.710131943  0.336459629
## 430 -0.404361949  1.388677827
## 431  5.257022736 -0.712608455
## 432  1.194353397  5.339004567
## 433 -0.380412320  3.301599027
## 434 -3.458148091 -4.113879725
## 436  1.597226607  5.705924457
## 437 -3.685620038 -2.600700410
## 438  5.205162316 -0.621297608
## 439 -2.444808767 -0.182537284
## 440 -0.529253710  3.238022652
## 441 -2.542363560 -1.465580522
## 442 -0.490274165  3.381526867
## 443 -2.863875947 -0.820291834
## 444 -3.007165646 -1.042178243
## 445 -2.526830310 -1.458493718
## 446 -3.618005995 -1.312674946
## 449 -2.339299841  0.052143880
## 450 -3.607269072 -2.996486909
## 451  1.214356371  5.201364416
## 452 -1.763198020  1.845085702
## 453 -3.470264940 -3.953785864
## 454  5.352393732  0.083960478
## 455 -3.271695011 -1.759924884
## 457 -2.918095187 -1.134969786
## 458 -0.701682923  0.864082188
## 459 -3.377222601 -1.754942333
## 460  1.267766754  5.462357632
## 461 -0.941542826  2.980991403
## 462 -1.581715076  2.167614357
## 463 -0.629772326  0.239760403
## 464 -3.452610816 -4.032305152
## 465 -0.740516637  0.635620266
## 466 -3.593922903 -3.069839821
## 467 -3.697756140 -2.420284737
## 468 -3.750964483 -1.844155894
## 469 -2.317342634  0.846669718
## 470 -0.609354004  3.377047060
## 471 -3.348591502 -2.403231415
## 472 -3.335629682 -1.755030070
## 474 -3.690289243 -3.499537927
## 475 -3.580885968 -3.586735392
## 476 -2.372531322  0.388606176
## 477 -3.696305607 -3.672462145
## 478 -1.369294736  0.249769654
## 479 -2.255747143 -1.091990123
## 480 -2.732844035 -1.239142851
## 484 -0.384751674  3.068773099
## 485  5.269030819 -0.174188122
## 486 -2.646885132 -1.362413940
## 488  5.343956190 -0.770353439
## 490 -3.259878592 -1.170137874
## 491 -2.936588245 -1.191191483
## 492 -3.663094261 -1.329123843
## 493 -1.403217778  0.285822094
## 494 -3.477286901 -4.006583805
## 495  1.286094483  5.444653274
## 497 -2.584814631  0.280986874
## 498 -0.713167264  3.429409968
## 499 -1.757716409  2.002558613
## 500  5.449807385 -0.691395735
## 501 -1.040172085  3.063872679
## 502 -0.945784607  2.773424876
## 503  5.194885398 -0.307637383
## 504 -3.350499815 -1.562627367
## 505 -3.828621225 -1.756106244
## 507  1.371116330  5.867811349
## 508  1.328445207  5.565251492
## 509 -2.225709341 -0.662004834
## 511 -0.958374670  2.891456383
## 512 -2.568012465  0.054362466
## 513  5.362204039 -0.774033786
## 514 -3.405257507 -1.188529284
## 515  0.955069188  5.137479723
## 516 -3.845157001 -2.082596887
## 517 -3.852761315 -2.087723969
## 518  1.339432435  5.940778135
## 519 -2.924315457 -1.185839080
## 522 -3.725987679 -1.348560671
## 523 -0.987965952  3.195242482
## 524 -1.345769200  2.964806237
## 525 -0.746427996  3.305560322
## 526 -3.890590236 -3.418754657
## 527 -4.004861284 -1.717774498
## 528  1.258993633  6.028516510
## 529 -3.809309127 -3.515144001
## 530 -3.300793560 -1.039742180
## 531 -0.853195597  3.120148423
## 532 -1.508387317  2.488313879
## 533  1.460237004  5.767878047
## 534 -4.051010683 -1.732134851
## 535 -4.068629797 -1.730420233
## 536 -2.747577651  0.400910505
## 537 -3.990444528 -3.232706331
## 538 -2.566045693  0.537479293
## 539 -2.460850039 -1.181367490
## 541  5.344758317 -0.334988292
## 542 -2.817575423  0.045878872
## 543  5.305310625 -0.181347731
## 545 -2.500003613 -0.045723136
## 546 -4.125019269 -1.858035732
## 547 -3.571002667 -0.827895449
## 548  5.382484442  0.181977491
## 550 -0.706852844  1.759080549
## 551 -3.941890537 -1.409549722
## 555  1.465040092  6.062424559
## 558 -4.050702863 -1.727746104
## 560 -0.774044876  3.489556608
## 561 -2.860435987  0.055983847
## 563 -0.740785384  0.883309145
## 564  1.384387399  6.135068645
## 566 -0.960839330  3.299793335
## 568  1.323212219  5.931017006
## 569 -1.259105161  3.115989591
## 571 -3.898841157 -1.278869597
## 572 -4.061875688 -3.259240515
## 573 -3.743169033 -1.339556830
## 574  5.218865018 -0.295996546
## 575 -3.883312099 -1.406038615
## 578 -3.219451447 -0.196612277
## 579 -3.520085799 -0.633090220
## 580 -2.238946123 -0.827380285
## 581 -1.222326060  3.196859380
## 583 -0.908763872  3.393027817
## 584 -1.042304567  2.512471134
## 585 -3.585851053 -4.050874795
## 586 -3.908053556 -1.424969210
## 587 -4.208378119 -1.739543586
## 588 -2.641932771  0.468835782
## 590 -3.994389464 -3.397830185
## 591 -0.623076932  1.208027077
## 592 -3.464693199 -0.714042367
## 593 -1.046500764  2.665309073
## 594  1.366762826  5.593223154
## 597 -2.616767710  0.600349486
## 599 -4.054337880 -3.252529784
## 600  1.639964718  6.115483041
## 601  5.427883821 -0.034709392
## 602 -0.544676073  1.360776298
## 603 -0.828545458  0.759635976
## 604 -4.031626128 -3.338221462
## 605 -1.419722695  2.736873259
## 606 -4.165448144 -1.524353522
## 608 -2.379034606 -0.576733494
## 609 -4.011018773 -1.084770221
## 610 -1.001451030  3.107237691
## 611 -2.735467929  0.094302944
## 613 -1.235166845  3.143898102
## 615 -1.415354222  2.613766921
## 616 -4.204863272 -1.297427162
## 619  1.859559495  6.180238058
## 620  1.469478130  5.852607376
## 622 -4.255379481 -1.681390783
## 623 -4.208045098 -1.679792848
## 624 -4.142524915 -1.140932524
## 625 -3.373814425 -0.327632315
## 626 -2.220436631 -0.747090103
## 628 -2.853505605  0.395351564
## 629 -4.196600253 -2.414088893
## 630 -3.520905729 -0.522501110
## 631 -4.163493225 -1.180841584
## 632 -1.059777512  2.375832027
## 634 -1.326001843  2.557253261
## 636 -2.976575324 -0.018718898
## 638  1.317806826  6.175886657
## 641 -2.329360497 -0.547616796
## 642 -4.115134235 -3.229364958
## 643  1.292088115  6.175836194
## 647  1.602890188  6.134915844
## 648 -2.287530741 -0.794629350
## 649 -3.557470457 -0.514787309
## 650 -2.932287940  0.276550466
## 652  1.203740883  6.216805284
## 661 -4.243507620 -2.188620616
## 662 -4.326298325 -1.550611249
## 664 -1.326971418  2.909469671
## 666 -4.172265632 -1.108485538
## 667  1.207864897  6.131586720
## 671 -1.374800263  3.110835365
ggplot(data.frame(PC1 = pca_original$x[,1], PC2 = pca_original$x[,2]), aes(x = PC1, y = PC2)) + 
  geom_point() + ggtitle("PCA - O")

ggplot(data.frame(PC1 = pca_50$x[,1], PC2 = pca_50$x[,2]), aes(x = PC1, y = PC2)) + 
  geom_point() + ggtitle("PCA - 50% ")

ggplot(data.frame(PC1 = pca_100$x[,1], PC2 = pca_100$x[,2]), aes(x = PC1, y = PC2)) + 
  geom_point() + ggtitle("PCA - 100% ")

ggplot(data.frame(UMAP1 = umap_original[,1], UMAP2 = umap_original[,2]), aes(x = UMAP1, y = UMAP2)) + 
  geom_point() + ggtitle("UMAP - Orig")

ggplot(data.frame(UMAP1 = umap_50[,1], UMAP2 = umap_50[,2]), aes(x = UMAP1, y = UMAP2)) + 
  geom_point() + ggtitle("UMAP - 50% ")

ggplot(data.frame(UMAP1 = umap_100[,1], UMAP2 = umap_100[,2]), aes(x = UMAP1, y = UMAP2)) + 
  geom_point() + ggtitle("UMAP - 100% ")

Честно говоря я не понимаю, что происходит, по визуализации как будто кумулятивная не должна меняться, просто новые кластеры появляются, но общий результат должен быть похожим

Если вам не трудно, могли бы вы в фидбеке обьяснить, как правильно интерпретировать и как делать последние два пункта :) Я сдаюсь…